edwh-editorjs 2.0.0b1__py3-none-any.whl → 2.0.0b3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
editorjs/__about__.py ADDED
@@ -0,0 +1 @@
1
+ __version__ = "2.0.0-beta.3"
editorjs/__init__.py ADDED
@@ -0,0 +1,5 @@
1
+ from .core import EditorJS
2
+
3
+ __all__ = [
4
+ "EditorJS",
5
+ ]
editorjs/blocks.py ADDED
@@ -0,0 +1,382 @@
1
+ """
2
+ mdast to editorjs
3
+ """
4
+
5
+ import abc
6
+ import re
7
+ import typing as t
8
+
9
+ from .exceptions import TODO
10
+ from .types import EditorChildData, MDChildNode
11
+
12
+
13
+ class EditorJSBlock(abc.ABC):
14
+ @classmethod
15
+ @abc.abstractmethod
16
+ def to_markdown(cls, data: EditorChildData) -> str: ...
17
+
18
+ @classmethod
19
+ @abc.abstractmethod
20
+ def to_json(cls, node: MDChildNode) -> list[dict]: ...
21
+
22
+ @classmethod
23
+ @abc.abstractmethod
24
+ def to_text(cls, node: MDChildNode) -> str: ...
25
+
26
+
27
+ BLOCKS: dict[str, EditorJSBlock] = {}
28
+
29
+
30
+ def block(*names: str):
31
+ def wrapper(cls):
32
+ for name in names:
33
+ BLOCKS[name] = cls
34
+ return cls
35
+
36
+ return wrapper
37
+
38
+
39
+ def process_styled_content(item: MDChildNode, strict: bool = True) -> str:
40
+ """
41
+ Processes styled content (e.g., bold, italic) within a list item.
42
+
43
+ Args:
44
+ item: A ChildNode dictionary representing an inline element or text.
45
+ strict: Raise if 'type' is not one defined in 'html_wrappers'
46
+
47
+ Returns:
48
+ A formatted HTML string based on the item type.
49
+ """
50
+ _type = item.get("type")
51
+ html_wrappers = {
52
+ "text": "{value}",
53
+ "html": "{value}",
54
+ "emphasis": "<i>{value}</i>",
55
+ "strong": "<b>{value}</b>",
56
+ "strongEmphasis": "<b><i>{value}</i></b>",
57
+ "link": '<a href="{url}">{value}</a>',
58
+ "inlineCode": '<code class="inline-code">{value}</code>',
59
+ # todo: <mark>
60
+ }
61
+
62
+ if _type in BLOCKS:
63
+ return BLOCKS[_type].to_text(item)
64
+
65
+ if strict and _type not in html_wrappers:
66
+ raise ValueError(f"Unsupported type {_type} in paragraph")
67
+
68
+ # Process children recursively if they exist, otherwise use the direct value
69
+ if children := item.get("children"):
70
+ value = "".join(process_styled_content(child) for child in children)
71
+ else:
72
+ value = item.get("value", "")
73
+
74
+ template = html_wrappers.get(_type, "{value}")
75
+ return template.format(
76
+ value=value, url=item.get("url", ""), caption=item.get("caption", "")
77
+ )
78
+
79
+
80
+ def default_to_text(node: MDChildNode):
81
+ return "".join(
82
+ process_styled_content(child) for child in node.get("children", [])
83
+ ) or process_styled_content(node)
84
+
85
+
86
+ @block("heading", "header")
87
+ class HeadingBlock(EditorJSBlock):
88
+ @classmethod
89
+ def to_markdown(cls, data: EditorChildData) -> str:
90
+ level = data.get("level", 1)
91
+ text = data.get("text", "")
92
+
93
+ if not (1 <= level <= 6):
94
+ raise ValueError("Header level must be between 1 and 6.")
95
+
96
+ return f"{'#' * level} {text}\n"
97
+
98
+ @classmethod
99
+ def to_json(cls, node: MDChildNode) -> list[dict]:
100
+ """
101
+ Converts a Markdown header block into structured block data.
102
+
103
+ Args:
104
+ node: A RootNode dictionary with 'depth' and 'children'.
105
+
106
+ Returns:
107
+ A ChildNode dictionary representing the header data, or None if no children exist.
108
+
109
+ Raises:
110
+ ValueError: If an unsupported heading depth is provided.
111
+ """
112
+
113
+ depth = node.get("depth")
114
+
115
+ if depth is None or not (1 <= depth <= 6):
116
+ raise ValueError("Heading depth must be between 1 and 6.")
117
+
118
+ return [{"data": {"level": depth, "text": cls.to_text(node)}, "type": "header"}]
119
+
120
+ @classmethod
121
+ def to_text(cls, node: MDChildNode) -> str:
122
+ children = node.get("children", [])
123
+ if children is None or not len(children) == 1:
124
+ raise ValueError("Header block must have exactly one child element")
125
+ child = children[0]
126
+ return child.get("value", "")
127
+
128
+
129
+ @block("paragraph")
130
+ class ParagraphBlock(EditorJSBlock):
131
+ @classmethod
132
+ def to_markdown(cls, data: EditorChildData) -> str:
133
+ text = data.get("text", "")
134
+ return f"{text}\n"
135
+
136
+ @classmethod
137
+ def to_json(cls, node: MDChildNode) -> list[dict]:
138
+ result = []
139
+ current_text = ""
140
+
141
+ for child in node.get("children"):
142
+ _type = child.get("type")
143
+ if _type == "image":
144
+ if current_text:
145
+ result.append({"data": {"text": current_text}, "type": "paragraph"})
146
+ current_text = ""
147
+
148
+ result.extend(ImageBlock.to_json(child))
149
+ else:
150
+ current_text += cls.to_text(child)
151
+
152
+ # final text after image:
153
+ if current_text:
154
+ result.append({"data": {"text": current_text}, "type": "paragraph"})
155
+
156
+ return result
157
+
158
+ @classmethod
159
+ def to_text(cls, node: MDChildNode) -> str:
160
+ return default_to_text(node)
161
+
162
+
163
+ @block("list")
164
+ class ListBlock(EditorJSBlock):
165
+ @classmethod
166
+ def to_markdown(cls, data: EditorChildData) -> str:
167
+ style = data.get("style", "unordered")
168
+ items = data.get("items", [])
169
+
170
+ def parse_items(subitems: list[dict[str, t.Any]], depth: int = 0) -> str:
171
+ markdown_items = []
172
+ for index, item in enumerate(subitems):
173
+ prefix = f"{index + 1}." if style == "ordered" else "-"
174
+ line = f"{'\t' * depth}{prefix} {item['content']}"
175
+ markdown_items.append(line)
176
+
177
+ # Recurse if there are nested items
178
+ if item.get("items"):
179
+ markdown_items.append(parse_items(item["items"], depth + 1))
180
+
181
+ return "\n".join(markdown_items)
182
+
183
+ return "\n" + parse_items(items) + "\n"
184
+
185
+ @classmethod
186
+ def to_json(cls, node: MDChildNode) -> list[dict]:
187
+ """
188
+ Converts a Markdown list block with nested items and styling into structured block data.
189
+
190
+ Args:
191
+ node: A RootNode dictionary with 'ordered' and 'children'.
192
+
193
+ Returns:
194
+ A dictionary representing the structured list data with 'items' and 'style'.
195
+ """
196
+ items = []
197
+ # checklists are not supported (well) by mdast
198
+ # so we detect it ourselves:
199
+ could_be_checklist = True
200
+
201
+ def is_checklist(value: str) -> bool:
202
+ return value.strip().startswith(("[ ]", "[x]"))
203
+
204
+ for child in node["children"]:
205
+ content = ""
206
+ subitems = []
207
+ # child can have content and/or items
208
+ for grandchild in child["children"]:
209
+ _type = grandchild.get("type", "")
210
+ if _type == "paragraph":
211
+ subcontent = ParagraphBlock.to_text(grandchild)
212
+ could_be_checklist = could_be_checklist and is_checklist(subcontent)
213
+ content += "" + subcontent
214
+ elif _type == "list":
215
+ could_be_checklist = False
216
+ subitems.extend(ListBlock.to_json(grandchild)[0]["data"]["items"])
217
+ else:
218
+ raise ValueError(f"Unsupported type {_type} in list")
219
+
220
+ items.append(
221
+ {
222
+ "content": content,
223
+ "items": subitems,
224
+ }
225
+ )
226
+
227
+ # todo: detect 'checklist':
228
+ """
229
+ type: checklist
230
+ data: {items: [{text: "a", checked: false}, {text: "b", checked: false}, {text: "c", checked: true},…]}
231
+ """
232
+
233
+ if could_be_checklist:
234
+ return [
235
+ {
236
+ "type": "checklist",
237
+ "data": {
238
+ "items": [
239
+ {
240
+ "text": x["content"]
241
+ .removeprefix("[ ] ")
242
+ .removeprefix("[x] "),
243
+ "checked": x["content"].startswith("[x]"),
244
+ }
245
+ for x in items
246
+ ]
247
+ },
248
+ }
249
+ ]
250
+ else:
251
+ return [
252
+ {
253
+ "data": {
254
+ "items": items,
255
+ "style": "ordered" if node.get("ordered") else "unordered",
256
+ },
257
+ "type": "list",
258
+ }
259
+ ]
260
+
261
+ @classmethod
262
+ def to_text(cls, node: MDChildNode) -> str:
263
+ return ""
264
+
265
+
266
+ @block("checklist")
267
+ class ChecklistBlock(ListBlock):
268
+ @classmethod
269
+ def to_markdown(cls, data: EditorChildData) -> str:
270
+ markdown_items = []
271
+
272
+ for item in data.get("items", []):
273
+ text = item.get("text", "").strip()
274
+ char = "x" if item.get("checked", False) else " "
275
+ markdown_items.append(f"- [{char}] {text}")
276
+
277
+ return "\n" + "\n".join(markdown_items) + "\n"
278
+
279
+
280
+ @block("thematicBreak", "delimiter")
281
+ class DelimiterBlock(EditorJSBlock):
282
+ @classmethod
283
+ def to_markdown(cls, data: EditorChildData) -> str:
284
+ return "***\n"
285
+
286
+ @classmethod
287
+ def to_json(cls, node: MDChildNode) -> list[dict]:
288
+ return [
289
+ {
290
+ "type": "delimiter",
291
+ "data": {},
292
+ }
293
+ ]
294
+
295
+ @classmethod
296
+ def to_text(cls, node: MDChildNode) -> str:
297
+ return ""
298
+
299
+
300
+ @block("code")
301
+ class CodeBlock(EditorJSBlock):
302
+ @classmethod
303
+ def to_markdown(cls, data: EditorChildData) -> str:
304
+ code = data.get("code", "")
305
+ return f"```\n" f"{code}" f"\n```\n"
306
+
307
+ @classmethod
308
+ def to_json(cls, node: MDChildNode) -> list[dict]:
309
+ return [
310
+ {
311
+ "data": {"code": cls.to_text(node)},
312
+ "type": "code",
313
+ }
314
+ ]
315
+
316
+ @classmethod
317
+ def to_text(cls, node: MDChildNode) -> str:
318
+ return node.get("value", "")
319
+
320
+
321
+ @block("image")
322
+ class ImageBlock(EditorJSBlock):
323
+ @classmethod
324
+ def to_markdown(cls, data: EditorChildData) -> str:
325
+ url = data.get("url", "") or data.get("file", {}).get("url", "")
326
+ caption = data.get("caption", "")
327
+ return f"""![{caption}]({url} "{caption}")\n"""
328
+
329
+ @classmethod
330
+ def to_json(cls, node: MDChildNode) -> list[dict]:
331
+ return [
332
+ {
333
+ "type": "image",
334
+ "data": {
335
+ "caption": cls.to_text(node),
336
+ "file": {"url": node.get("url")},
337
+ },
338
+ }
339
+ ]
340
+
341
+ @classmethod
342
+ def to_text(cls, node: MDChildNode) -> str:
343
+ return node.get("alt") or node.get("caption") or ""
344
+
345
+
346
+ @block("blockquote", "quote")
347
+ class QuoteBlock(EditorJSBlock):
348
+ re_cite = re.compile(r"<cite>(.+?)<\/cite>")
349
+
350
+ @classmethod
351
+ def to_markdown(cls, data: EditorChildData) -> str:
352
+ text = data.get("text", "")
353
+ result = f"> {text}\n"
354
+ if caption := data.get("caption", ""):
355
+ result += f"> <cite>{caption}</cite>\n"
356
+ return result
357
+
358
+ @classmethod
359
+ def to_json(cls, node: MDChildNode) -> list[dict]:
360
+ caption = ""
361
+ text = cls.to_text(node).replace("\n", "<br/>\n")
362
+
363
+ if cite := re.search(cls.re_cite, text):
364
+ # Capture the value of the first group
365
+ caption = cite.group(1)
366
+ # Remove the <cite>...</cite> tags from the text
367
+ text = re.sub(cls.re_cite, "", text)
368
+
369
+ return [
370
+ {
371
+ "data": {
372
+ "alignment": "left",
373
+ "caption": caption,
374
+ "text": text,
375
+ },
376
+ "type": "quote",
377
+ }
378
+ ]
379
+
380
+ @classmethod
381
+ def to_text(cls, node: MDChildNode) -> str:
382
+ return default_to_text(node)
editorjs/core.py ADDED
@@ -0,0 +1,116 @@
1
+ import json
2
+ import textwrap
3
+ import typing as t
4
+
5
+ import markdown2
6
+ import mdast
7
+ from typing_extensions import Self
8
+
9
+ from .blocks import BLOCKS
10
+ from .exceptions import TODO
11
+ from .helpers import unix_timestamp
12
+ from .types import MDRootNode
13
+
14
+ EDITORJS_VERSION = "2.30.6"
15
+
16
+
17
+ class EditorJS:
18
+ # internal representation is mdast, because we can convert to other types
19
+ _mdast: MDRootNode
20
+
21
+ def __init__(self, _mdast: str | dict, extras: list = ("task_list", "fenced-code-blocks")):
22
+ if not isinstance(_mdast, str | dict):
23
+ raise TypeError("Only `str` or `dict` is supported!")
24
+
25
+ self._mdast = t.cast(
26
+ MDRootNode, json.loads(_mdast) if isinstance(_mdast, str) else _mdast
27
+ )
28
+
29
+ self._md = markdown2.Markdown(extras=extras) # todo: striketrough, table, ?
30
+
31
+ @classmethod
32
+ def from_json(cls, data: str | dict) -> Self:
33
+ """
34
+ Load from EditorJS JSON Blocks
35
+ """
36
+ data = data if isinstance(data, dict) else json.loads(data)
37
+ markdown_items = []
38
+ for child in data["blocks"]:
39
+ _type = child["type"]
40
+ if not (block := BLOCKS.get(_type)):
41
+ raise TypeError(f"Unsupported block type `{_type}`")
42
+
43
+ markdown_items.append(block.to_markdown(child.get("data", {})))
44
+
45
+ markdown = "".join(markdown_items)
46
+ return cls.from_markdown(markdown)
47
+
48
+ @classmethod
49
+ def from_markdown(cls, data: str) -> Self:
50
+ """
51
+ Load from markdown string
52
+ """
53
+
54
+ return cls(mdast.md_to_json(data))
55
+
56
+ @classmethod
57
+ def from_mdast(cls, data: str | dict) -> Self:
58
+ """
59
+ Existing mdast representation
60
+ """
61
+ return cls(data)
62
+
63
+ def to_json(self) -> str:
64
+ """
65
+ Export EditorJS JSON Blocks
66
+ """
67
+ # logic based on https://github.com/carrara88/editorjs-md-parser/blob/main/src/MarkdownImporter.js
68
+ blocks = []
69
+ for child in self._mdast["children"]:
70
+ _type = child["type"]
71
+ if not (block := BLOCKS.get(_type)):
72
+ raise TypeError(f"Unsupported block type `{_type}`")
73
+
74
+ blocks.extend(block.to_json(child))
75
+
76
+ data = {"time": unix_timestamp(), "blocks": blocks, "version": EDITORJS_VERSION}
77
+
78
+ return json.dumps(data)
79
+
80
+ def to_markdown(self) -> str:
81
+ """
82
+ Export Markdown string
83
+ """
84
+ md = mdast.json_to_md(self.to_mdast())
85
+ # idk why this happens:
86
+ md = md.replace(r"\[ ]", "[ ]")
87
+ md = md.replace(r"\[x]", "[x]")
88
+ return md
89
+
90
+ def to_mdast(self) -> str:
91
+ """
92
+ Export mdast representation
93
+ """
94
+ return json.dumps(self._mdast)
95
+
96
+ def to_html(self) -> str:
97
+ """
98
+ Export HTML string
99
+ """
100
+ md = self.to_markdown()
101
+ return self._md.convert(md)
102
+
103
+ def __repr__(self):
104
+ md = self.to_markdown()
105
+ md = md.replace("\n", "\\n")
106
+ return f"EditorJS({md})"
107
+
108
+ def __str__(self):
109
+ return self.to_markdown()
110
+
111
+ # def __eq__(self, other: Self) -> bool:
112
+ # a = self.to_markdown()
113
+ # b = other.to_markdown()
114
+ #
115
+ # remove = string.punctuation + string.whitespace
116
+ # return a.translate(remove) == b.translate(remove)
editorjs/exceptions.py ADDED
@@ -0,0 +1,3 @@
1
+ class TODO(NotImplementedError):
2
+ def __init__(self, msg: str = "todo"):
3
+ super().__init__(msg)
editorjs/helpers.py ADDED
@@ -0,0 +1,5 @@
1
+ import time
2
+
3
+
4
+ def unix_timestamp():
5
+ return round(time.time() * 1000)
editorjs/types.py ADDED
@@ -0,0 +1,43 @@
1
+ import typing as t
2
+
3
+
4
+ class MDPosition(t.TypedDict):
5
+ line: int
6
+ column: int
7
+ offset: int
8
+
9
+
10
+ class MDPositionRange(t.TypedDict):
11
+ start: MDPosition
12
+ end: MDPosition
13
+
14
+
15
+ class MDChildNode(t.TypedDict, total=False):
16
+ type: str # General identifier for node types
17
+ children: list["MDChildNode"] # Recursive children of any node type
18
+ position: MDPositionRange
19
+ value: str # Optional, for nodes like text that hold a value
20
+ depth: int # Optional, for nodes like headings that have a depth
21
+ url: t.NotRequired[str]
22
+
23
+
24
+ class MDRootNode(t.TypedDict):
25
+ type: t.Literal["root"] # Constrains to 'root' for the root node
26
+ children: list[MDChildNode] # Allows any ChildNode type in children
27
+ position: MDPositionRange
28
+
29
+
30
+ class EditorChildData(t.TypedDict, total=False):
31
+ text: str
32
+ items: list["EditorChildNode"]
33
+
34
+
35
+ class EditorChildNode(t.TypedDict):
36
+ type: str
37
+ data: EditorChildData
38
+
39
+
40
+ class EditorRootNode(t.TypedDict):
41
+ time: int
42
+ blocks: list[EditorChildNode]
43
+ version: str
@@ -0,0 +1,28 @@
1
+ Metadata-Version: 2.3
2
+ Name: edwh-editorjs
3
+ Version: 2.0.0b3
4
+ Summary: EditorJS.py
5
+ Project-URL: Homepage, https://github.com/educationwarehouse/edwh-EditorJS
6
+ Author-email: SKevo <skevo.cw@gmail.com>, Robin van der Noord <robin.vdn@educationwarehouse.nl>
7
+ License: MIT
8
+ License-File: LICENSE
9
+ Keywords: bleach,clean,editor,editor.js,html,javascript,json,parser,wysiwyg
10
+ Classifier: Development Status :: 4 - Beta
11
+ Classifier: Intended Audience :: Developers
12
+ Classifier: License :: OSI Approved :: MIT License
13
+ Classifier: Programming Language :: Python :: 3.10
14
+ Classifier: Programming Language :: Python :: 3.11
15
+ Classifier: Programming Language :: Python :: 3.12
16
+ Classifier: Programming Language :: Python :: 3.13
17
+ Requires-Python: >=3.10
18
+ Requires-Dist: markdown2
19
+ Requires-Dist: mdast
20
+ Provides-Extra: dev
21
+ Requires-Dist: edwh; extra == 'dev'
22
+ Requires-Dist: hatch; extra == 'dev'
23
+ Requires-Dist: su6[all]; extra == 'dev'
24
+ Requires-Dist: types-bleach; extra == 'dev'
25
+ Description-Content-Type: text/markdown
26
+
27
+ # edwh-editorjs
28
+
@@ -0,0 +1,11 @@
1
+ editorjs/__about__.py,sha256=TTjbddHImhhMSF_k6S9WFgA-Fcil370fw4WeR8a-eBk,29
2
+ editorjs/__init__.py,sha256=-OHUf7ZXfkbdFB1r85eIjpHRfql-GCNUCKuBEdEt2Rc,58
3
+ editorjs/blocks.py,sha256=WTtzsflkbhkZhjYQ6vZ_6Frl66ZU9uUbWwnX4mGzu4c,11341
4
+ editorjs/core.py,sha256=_mr-WJ2QgB2drgBLnPM38DAPTaxZba--H_EWiQcAZMY,3264
5
+ editorjs/exceptions.py,sha256=TyfHvk2Z5RbKxTDK7lrjgwAgVgInXIuDW63eO5jzVFw,106
6
+ editorjs/helpers.py,sha256=q861o5liNibMTp-Ozay17taF7CTNsRe901lYhhxdwHg,73
7
+ editorjs/types.py,sha256=W7IZWMWgzJaQulybIt0Gx5N63rVj4mEy73VJWo4VAQA,1029
8
+ edwh_editorjs-2.0.0b3.dist-info/METADATA,sha256=QeUtRWqC6v8mGhkm16JoFJ78KhFW0mSEhxHifKTmYjI,1009
9
+ edwh_editorjs-2.0.0b3.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
10
+ edwh_editorjs-2.0.0b3.dist-info/licenses/LICENSE,sha256=zzllbk0pvnmgzk31iq8Zkg0GkA8vVx_Zc3OHjVlTjxo,1101
11
+ edwh_editorjs-2.0.0b3.dist-info/RECORD,,
@@ -1,6 +1,7 @@
1
1
  MIT License
2
2
 
3
3
  Copyright (c) 2021 SKevo
4
+ Copyright (c) 2024 Education Warehouse
4
5
 
5
6
  Permission is hereby granted, free of charge, to any person obtaining a copy
6
7
  of this software and associated documentation files (the "Software"), to deal
@@ -1,104 +0,0 @@
1
- Metadata-Version: 2.3
2
- Name: edwh-editorjs
3
- Version: 2.0.0b1
4
- Summary: pyEditorJS
5
- Project-URL: Homepage, https://github.com/educationwarehouse/edwh-EditorJS
6
- Author-email: SKevo <skevo.cw@gmail.com>, Robin van der Noord <robin.vdn@educationwarehouse.nl>
7
- License: MIT
8
- License-File: LICENSE
9
- Keywords: bleach,clean,editor,editor.js,html,javascript,json,parser,wysiwyg
10
- Classifier: Development Status :: 4 - Beta
11
- Classifier: Intended Audience :: Developers
12
- Classifier: License :: OSI Approved :: MIT License
13
- Classifier: Programming Language :: Python :: 3.10
14
- Classifier: Programming Language :: Python :: 3.11
15
- Classifier: Programming Language :: Python :: 3.12
16
- Classifier: Programming Language :: Python :: 3.13
17
- Requires-Python: >=3.10
18
- Requires-Dist: bleach
19
- Provides-Extra: dev
20
- Requires-Dist: edwh; extra == 'dev'
21
- Requires-Dist: hatch; extra == 'dev'
22
- Requires-Dist: su6[all]; extra == 'dev'
23
- Requires-Dist: types-bleach; extra == 'dev'
24
- Description-Content-Type: text/markdown
25
-
26
- # edwh-editorjs
27
-
28
- A minimal, fast Python 3.10+ package for parsing [Editor.js](https://editorjs.io) content.
29
- This package is a fork of [pyEditorJS by SKevo](https://github.com/SKevo18/pyEditorJS) with additional capabilities.
30
-
31
- ## New Features
32
-
33
- - Expanded support for additional block types: Quote, Table, Code, Warning, and Raw blocks
34
- - Issues a warning if an unknown block type is encountered, rather than ignoring it
35
- - Adds a `strict` mode, raising an `EditorJSUnsupportedBlock` exception for unknown block types when `strict=True`
36
- - Allows adding new blocks by decorating a subclass of `EditorJsParser` with `@block("name")`
37
-
38
- ## Installation
39
-
40
- ```bash
41
- pip install edwh-editorjs
42
- ```
43
-
44
- ## Usage
45
-
46
- ### Quickstart
47
-
48
- ```python
49
- from pyeditorjs import EditorJsParser
50
-
51
- editor_js_data = ... # your Editor.js JSON data
52
- parser = EditorJsParser(editor_js_data) # initialize the parser
53
-
54
- html = parser.html(sanitize=True) # `sanitize=True` uses the included `bleach` dependency
55
- print(html) # your clean HTML
56
- ```
57
-
58
- ### Enforcing Strict Block Types
59
-
60
- ```python
61
- from pyeditorjs import EditorJsParser, EditorJSUnsupportedBlock
62
-
63
- editor_js_data: dict = ...
64
- parser = EditorJsParser(editor_js_data)
65
-
66
- try:
67
- html = parser.html(strict=True)
68
- except EditorJSUnsupportedBlock as e:
69
- print(f"Unsupported block type encountered: {e}")
70
- ```
71
-
72
- ### Adding a Custom Block
73
-
74
- To add a custom block type, create a new class that subclasses `EditorJsBlock` and decorates it with `@block("name")`,
75
- where `"name"` is the custom block type. Implement an `html` method to define how the block’s content should be
76
- rendered. This method should accept a `sanitize` parameter and can access block data via `self.data`.
77
-
78
- ```python
79
- from pyeditorjs import EditorJsParser, EditorJsBlock, block
80
-
81
- @block("custom")
82
- class CustomBlock(EditorJsBlock):
83
- def html(self, sanitize: bool = False) -> str:
84
- # Access data with self.data and return the rendered HTML
85
- content = self.data.get("something", "")
86
- if sanitize:
87
- content = self.sanitize(content)
88
-
89
- return f"<div class='custom-block'>{content}</div>"
90
-
91
- # Usage
92
- class CustomEditorJsParser(EditorJsParser):
93
- pass # Custom blocks are automatically detected
94
-
95
- editor_js_data = ... # Editor.js JSON data with a "customBlock" type
96
- parser = CustomEditorJsParser(editor_js_data)
97
- html = parser.html()
98
- print(html) # Includes rendered custom blocks
99
- ```
100
-
101
- ## Disclaimer
102
-
103
- This is a community-provided project and is not affiliated with the Editor.js team.
104
- Contributions, bug reports, and suggestions are welcome!
@@ -1,9 +0,0 @@
1
- pyeditorjs/__about__.py,sha256=I5vqr3Wm1FBwrGe3laM0fzEEDA_k4QsjCkyWUujPHec,29
2
- pyeditorjs/__init__.py,sha256=63UoNCWJo6NuPXXYnANQE3SKm1PQu2ggs89KCXSq-44,807
3
- pyeditorjs/blocks.py,sha256=4A8dXbh_oUKCctOHtMV6BrR7-UpyqFREPvwPEe_6vUo,8304
4
- pyeditorjs/exceptions.py,sha256=Uni8r3FwJ-6xQIdSmBsHLs_htWLHD0Arp1KJEvjGU1U,439
5
- pyeditorjs/parser.py,sha256=6DCqqi-FuXDFxn9xb-dgQ19alvVu7Pjx6x3rTAx9IsI,2154
6
- edwh_editorjs-2.0.0b1.dist-info/METADATA,sha256=4vIO1CBWAasUZ_JaZzm7E_FSE1s-x3LZeO_4rKfvhec,3521
7
- edwh_editorjs-2.0.0b1.dist-info/WHEEL,sha256=1yFddiXMmvYK7QYTqtRNtX66WJ0Mz8PYEiEUoOUUxRY,87
8
- edwh_editorjs-2.0.0b1.dist-info/licenses/LICENSE,sha256=bY9MhHLeuW8w1aAl-i1O1uSNP5IMOGaL6AWvHcdnt0k,1062
9
- edwh_editorjs-2.0.0b1.dist-info/RECORD,,
pyeditorjs/__about__.py DELETED
@@ -1 +0,0 @@
1
- __version__ = "2.0.0-beta.1"
pyeditorjs/__init__.py DELETED
@@ -1,30 +0,0 @@
1
- from pathlib import Path
2
-
3
- from .blocks import BLOCKS_MAP, EditorJsBlock, block
4
- from .exceptions import EditorJsException, EditorJsParseError, EditorJSUnsupportedBlock
5
- from .parser import EditorJsParser
6
-
7
- __all__ = [
8
- "EditorJsParser",
9
- "EditorJsParseError",
10
- "EditorJsException",
11
- "EditorJSUnsupportedBlock",
12
- "EditorJsBlock",
13
- "block",
14
- "BLOCKS_MAP",
15
- ]
16
-
17
-
18
- # Overwrite __doc__ with README, so that pdoc can render it:
19
- README_PATH = Path(__file__).parent.parent.absolute() / Path("README.md")
20
- try:
21
- with open(README_PATH, "r", encoding="UTF-8") as readme:
22
- __readme__ = readme.read()
23
- except Exception:
24
- __readme__ = "Failed to read README.md!" # fallback message, for example when there's no README
25
-
26
- __doc__ = __readme__
27
-
28
-
29
- if __name__ == "__main__":
30
- _ = [EditorJsParser]
pyeditorjs/blocks.py DELETED
@@ -1,313 +0,0 @@
1
- import abc
2
- import typing as t
3
- from dataclasses import dataclass
4
-
5
- import bleach
6
-
7
- from .exceptions import EditorJsParseError
8
-
9
- __all__ = [
10
- "block",
11
- "BLOCKS_MAP",
12
- "EditorJsBlock",
13
- ]
14
-
15
-
16
- def _sanitize(html: str) -> str:
17
- return bleach.clean(
18
- html,
19
- tags=["b", "i", "u", "a", "mark", "code"],
20
- attributes=["class", "data-placeholder", "href"],
21
- )
22
-
23
-
24
- BLOCKS_MAP: t.Dict[str, t.Type["EditorJsBlock"]] = {
25
- # 'header': HeaderBlock,
26
- # 'paragraph': ParagraphBlock,
27
- # 'list': ListBlock,
28
- # 'delimiter': DelimiterBlock,
29
- # 'image': ImageBlock,
30
- }
31
-
32
-
33
- def block(_type: str):
34
- def wrapper(cls: t.Type["EditorJsBlock"]):
35
- BLOCKS_MAP[_type] = cls
36
- return cls
37
-
38
- return wrapper
39
-
40
-
41
- @dataclass
42
- class EditorJsBlock(abc.ABC):
43
- """
44
- A generic parsed Editor.js block
45
- """
46
-
47
- _data: dict
48
- """The raw JSON data of the entire block"""
49
-
50
- @classmethod
51
- def sanitize(cls, html: str) -> str:
52
- return _sanitize(html)
53
-
54
- @property
55
- def id(self) -> t.Optional[str]:
56
- """
57
- Returns ID of the block, generated client-side.
58
- """
59
-
60
- return self._data.get("id", None)
61
-
62
- @property
63
- def type(self) -> t.Optional[str]:
64
- """
65
- Returns the type of the block.
66
- """
67
-
68
- return self._data.get("type", None)
69
-
70
- @property
71
- def data(self) -> dict:
72
- """
73
- Returns the actual block data.
74
- """
75
-
76
- return self._data.get("data", {})
77
-
78
- @abc.abstractmethod
79
- def html(self, sanitize: bool = False) -> str:
80
- """
81
- Returns the HTML representation of the block.
82
-
83
- ### Parameters:
84
- - `sanitize` - if `True`, then the block's text/contents will be sanitized.
85
- """
86
-
87
- raise NotImplementedError()
88
-
89
-
90
- @block("header")
91
- class HeaderBlock(EditorJsBlock):
92
- VALID_HEADER_LEVEL_RANGE = range(1, 7)
93
- """Valid range for header levels. Default is `range(1, 7)` - so, `0` - `6`."""
94
-
95
- @property
96
- def text(self) -> str:
97
- """
98
- Returns the header's text.
99
- """
100
-
101
- return self.data.get("text", "")
102
-
103
- @property
104
- def level(self) -> int:
105
- """
106
- Returns the header's level (`0` - `6`).
107
- """
108
-
109
- _level = self.data.get("level", 1)
110
-
111
- if not isinstance(_level, int) or _level not in self.VALID_HEADER_LEVEL_RANGE:
112
- raise EditorJsParseError(f"`{_level}` is not a valid header level.")
113
-
114
- return _level
115
-
116
- def html(self, sanitize: bool = False) -> str:
117
- text = self.text
118
- if sanitize:
119
- text = _sanitize(text)
120
- return rf'<h{self.level} class="cdx-block ce-header">{text}</h{self.level}>'
121
-
122
-
123
- @block("paragraph")
124
- class ParagraphBlock(EditorJsBlock):
125
- @property
126
- def text(self) -> str:
127
- """
128
- The text content of the paragraph.
129
- """
130
-
131
- return self.data.get("text", "")
132
-
133
- def html(self, sanitize: bool = False) -> str:
134
- return rf'<p class="cdx-block ce-paragraph">{_sanitize(self.text) if sanitize else self.text}</p>'
135
-
136
-
137
- @block("list")
138
- class ListBlock(EditorJsBlock):
139
- VALID_STYLES = ("unordered", "ordered")
140
- """Valid list order styles."""
141
-
142
- @property
143
- def style(self) -> t.Optional[str]:
144
- """
145
- The style of the list. Can be `ordered` or `unordered`.
146
- """
147
-
148
- return self.data.get("style", None)
149
-
150
- @property
151
- def items(self) -> t.List[str]:
152
- """
153
- Returns the list's items, in raw format.
154
- """
155
-
156
- return self.data.get("items", [])
157
-
158
- def html(self, sanitize: bool = False) -> str:
159
- if self.style not in self.VALID_STYLES:
160
- raise EditorJsParseError(f"`{self.style}` is not a valid list style.")
161
-
162
- _items = [
163
- f"<li>{_sanitize(item) if sanitize else item}</li>" for item in self.items
164
- ]
165
- _type = "ul" if self.style == "unordered" else "ol"
166
- _items_html = "".join(_items)
167
-
168
- return rf'<{_type} class="cdx-block cdx-list cdx-list--{self.style}">{_items_html}</{_type}>'
169
-
170
-
171
- @block("delimiter")
172
- class DelimiterBlock(EditorJsBlock):
173
- def html(self, sanitize: bool = False) -> str:
174
- return r'<div class="cdx-block ce-delimiter"></div>'
175
-
176
-
177
- @block("image")
178
- class ImageBlock(EditorJsBlock):
179
- @property
180
- def file_url(self) -> str:
181
- """
182
- URL of the image file.
183
- """
184
-
185
- return self.data.get("file", {}).get("url", "")
186
-
187
- @property
188
- def caption(self) -> str:
189
- """
190
- The image's caption.
191
- """
192
-
193
- return self.data.get("caption", "")
194
-
195
- @property
196
- def with_border(self) -> bool:
197
- """
198
- Whether the image has a border.
199
- """
200
-
201
- return self.data.get("withBorder", False)
202
-
203
- @property
204
- def stretched(self) -> bool:
205
- """
206
- Whether the image is stretched.
207
- """
208
-
209
- return self.data.get("stretched", False)
210
-
211
- @property
212
- def with_background(self) -> bool:
213
- """
214
- Whether the image has a background.
215
- """
216
-
217
- return self.data.get("withBackground", False)
218
-
219
- def html(self, sanitize: bool = False) -> str:
220
- if self.file_url.startswith("data:image/"):
221
- _img = self.file_url
222
- else:
223
- _img = _sanitize(self.file_url) if sanitize else self.file_url
224
-
225
- parts = [
226
- rf'<div class="cdx-block image-tool image-tool--filled {"image-tool--stretched" if self.stretched else ""} {"image-tool--withBorder" if self.with_border else ""} {"image-tool--withBackground" if self.with_background else ""}">'
227
- r'<div class="image-tool__image">',
228
- r'<div class="image-tool__image-preloader"></div>',
229
- rf'<img class="image-tool__image-picture" src="{_img}"/>',
230
- r"</div>"
231
- rf'<div class="image-tool__caption" data-placeholder="{_sanitize(self.caption) if sanitize else self.caption}"></div>'
232
- r"</div>"
233
- r"</div>",
234
- ]
235
-
236
- return "".join(parts)
237
-
238
-
239
- @block("quote")
240
- class QuoteBlock(EditorJsBlock):
241
- def html(self, sanitize: bool = False) -> str:
242
- quote = self.data.get("text", "")
243
- caption = self.data.get("caption", "")
244
- if sanitize:
245
- quote = _sanitize(quote)
246
- caption = _sanitize(caption)
247
- _alignment = self.data.get("alignment", "left") # todo
248
- return f"""
249
- <blockquote class="cdx-block cdx-quote">
250
- <div class="cdx-input cdx-quote__text">{quote}</div>
251
- <cite class="cdx-input cdx-quote__caption">{caption}</cite>
252
- </blockquote>
253
- """
254
-
255
-
256
- @block("table")
257
- class TableBlock(EditorJsBlock):
258
- def html(self, sanitize: bool = False) -> str:
259
- content = self.data.get("content", [])
260
- _stretched = self.data.get("stretched", False) # todo
261
- _with_headings = self.data.get("withHeadings", False) # todo
262
-
263
- html_table = '<table class="tc-table">'
264
-
265
- # Add content rows
266
- for row in content:
267
- html_table += '<tr class="tc-row">'
268
- for cell in row:
269
- html_table += (
270
- f'<td class="tc-cell">{_sanitize(cell) if sanitize else cell}</td>'
271
- )
272
- html_table += "</tr>"
273
-
274
- html_table += "</table>"
275
- return html_table
276
-
277
-
278
- @block("code")
279
- class CodeBlock(EditorJsBlock):
280
- def html(self, sanitize: bool = False) -> str:
281
- code = self.data.get("code", "")
282
- if sanitize:
283
- code = _sanitize(code)
284
- return f"""
285
- <code class="ce-code__textarea cdx-input" data-empty="false">{code}</code>
286
- """
287
-
288
-
289
- @block("warning")
290
- class WarningBlock(EditorJsBlock):
291
- def html(self, sanitize: bool = False) -> str:
292
- title = self.data.get("title", "")
293
- message = self.data.get("message", "")
294
-
295
- if sanitize:
296
- title = _sanitize(title)
297
- message = _sanitize(message)
298
-
299
- return f"""
300
- <div class="cdx-block cdx-warning">
301
- <div class="cdx-input cdx-warning__title">{title}</div>
302
- <div class="cdx-input cdx-warning__message">{message}</div>
303
- </div>
304
- """
305
-
306
-
307
- @block("raw")
308
- class RawBlock(EditorJsBlock):
309
- def html(self, sanitize: bool = False) -> str:
310
- html = self.data.get("html", "")
311
- if sanitize:
312
- html = _sanitize(html)
313
- return html
pyeditorjs/exceptions.py DELETED
@@ -1,19 +0,0 @@
1
- __all__ = [
2
- "EditorJsException",
3
- "EditorJsParseError",
4
- "EditorJSUnsupportedBlock",
5
- ]
6
-
7
-
8
- class EditorJsException(Exception):
9
- """
10
- Base exception
11
- """
12
-
13
-
14
- class EditorJsParseError(EditorJsException):
15
- """Raised when a parse error occurs (example: the JSON data has invalid or malformed content)."""
16
-
17
-
18
- class EditorJSUnsupportedBlock(EditorJsException):
19
- """Raised when strict=True and using an unknown block type."""
pyeditorjs/parser.py DELETED
@@ -1,75 +0,0 @@
1
- import typing as t
2
- import warnings
3
- from dataclasses import dataclass
4
-
5
- from .blocks import BLOCKS_MAP, EditorJsBlock
6
- from .exceptions import EditorJsParseError, EditorJSUnsupportedBlock
7
-
8
-
9
- @dataclass
10
- class EditorJsParser:
11
- """
12
- An Editor.js parser.
13
- """
14
-
15
- content: dict
16
- """The JSON data of Editor.js content."""
17
-
18
- def __post_init__(self) -> None:
19
- if not isinstance(self.content, dict):
20
- raise EditorJsParseError(
21
- f"Content must be `dict`, not {type(self.content).__name__}"
22
- )
23
-
24
- @staticmethod
25
- def _get_block(data: dict, strict: bool = False) -> t.Optional[EditorJsBlock]:
26
- """
27
- Obtains block instance from block data.
28
- """
29
-
30
- _type = data.get("type", None)
31
-
32
- if _type not in BLOCKS_MAP:
33
- if strict:
34
- raise EditorJSUnsupportedBlock(_type)
35
- else:
36
- warnings.warn(f"Unsupported block: {_type}", category=RuntimeWarning)
37
- return None
38
-
39
- return BLOCKS_MAP[_type](_data=data)
40
-
41
- def blocks(self, strict: bool = False) -> list[EditorJsBlock]:
42
- """
43
- Obtains a list of all available blocks from the editor's JSON data.
44
- """
45
-
46
- all_blocks: list[EditorJsBlock] = []
47
- blocks = self.content.get("blocks", [])
48
-
49
- if not isinstance(blocks, list):
50
- raise EditorJsParseError(
51
- f"Blocks is not `list`, but `{type(blocks).__name__}`"
52
- )
53
-
54
- for block_data in blocks:
55
- if block := self._get_block(data=block_data, strict=strict):
56
- all_blocks.append(block)
57
-
58
- return all_blocks
59
-
60
- def __iter__(self) -> t.Iterator[EditorJsBlock]:
61
- """Returns `iter(self.blocks())`"""
62
-
63
- return iter(self.blocks())
64
-
65
- def html(self, sanitize: bool = False, strict: bool = False) -> str:
66
- """
67
- Renders the editor's JSON content as HTML.
68
-
69
- ### Parameters:
70
- - `sanitize` - whether to also sanitize the blocks' texts/contents.
71
- """
72
-
73
- return "\n".join(
74
- [block.html(sanitize=sanitize) for block in self.blocks(strict=strict)]
75
- )